import os
import cv2
import numpy as np
import pytesseract
from PIL import Image
def get_img(input_dir):
    """Collect the paths of every file found under ``input_dir``.

    The directory tree is walked recursively. No filtering by extension is
    done, so every file in the tree is returned, image or not.

    Args:
        input_dir: Root directory to search. A trailing path separator is
            fine; paths are built with ``os.path.join`` so no doubled
            separators are produced.

    Returns:
        A list of file paths, each prefixed with ``input_dir``. Files are
        listed in sorted order within each directory and sub-directories
        are visited in sorted order, so the result is deterministic. The
        list is empty when the directory is missing or holds no files.
    """
    img_paths = []
    for path, dirnames, filenames in os.walk(input_dir):
        # Sorting in place controls the order os.walk descends into
        # sub-directories, making the traversal reproducible.
        dirnames.sort()
        img_paths.extend(
            os.path.join(path, filename) for filename in sorted(filenames)
        )
    print("img_paths:", img_paths)
    return img_paths

def cut_img(img_paths, output_path='text.txt'):
    """Run OCR on each image and write the recognised text to a file.

    For every image a separator line is written, followed by the text
    returned by Tesseract (simplified Chinese + English models) and two
    newlines. The recognised text is also printed to stdout.

    Args:
        img_paths: Iterable of image file paths to process, in order.
        output_path: File the results are written to (UTF-8). It is
            truncated if it already exists. Defaults to ``'text.txt'``
            in the current working directory.

    Raises:
        Whatever ``Image.open`` or ``pytesseract.image_to_string`` raise
        for an unreadable image; the output file is still closed.
    """
    # Context managers guarantee the output file and each image handle
    # are released even if OCR fails part-way through the list.
    with open(output_path, 'w', encoding='utf-8') as f:
        for img_path in img_paths:
            # Load the image and recognise its text.
            with Image.open(img_path) as im:
                string = pytesseract.image_to_string(im, lang="chi_sim+eng")
            f.write('\n-------------------------')
            print(string)
            f.write(string + '\n\n')

if __name__ == '__main__':
    # Script entry point: list the files under the image directory,
    # then run OCR over all of them.
    input_dir = "img_cut/"  # directory holding the images to read
    found_paths = get_img(input_dir)
    print('图片获取完成 。。。！')
    cut_img(found_paths)